package com.zhang.spark_1.spark_core.operator.transform

import org.apache.spark.rdd.RDD
import org.apache.spark.{SparkConf, SparkContext}

/**
 * Demo of the RDD `map`-style transformation: reads the server log
 * `datas/apache.log` and prints the URL resource path requested on each line.
 *
 * Each log line is split on single spaces and the field at index 6 is taken
 * as the requested URL path. Lines with fewer than seven fields (for example
 * blank lines) are skipped instead of failing the whole job.
 *
 * @author: zhang
 * @date: 2021/12/5 18:51
 */
object Spark01_RDD_Operator_Transform_Test {

  /** Zero-based index of the URL field after splitting a log line on single spaces. */
  private val UrlFieldIndex = 6

  /**
   * Entry point: builds a local Spark context, extracts the URL field from
   * every log line and prints the results on the driver.
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    // Create the Spark connection (local mode, master "local[*]").
    val conf: SparkConf = new SparkConf().setMaster("local[*]").setAppName("operator")
    val sc: SparkContext = new SparkContext(conf)

    // try/finally guarantees the context is stopped even if the job throws.
    try {
      val rdd: RDD[String] = sc.textFile("datas/apache.log")

      // flatMap over an Option keeps the URL when present and drops lines
      // that are too short, so one malformed line cannot crash the job.
      val rddMap: RDD[String] = rdd.flatMap(line => extractUrl(line))

      rddMap.collect().foreach(println)
    } finally {
      sc.stop()
    }
  }

  /**
   * Extracts the requested URL path from a single log line.
   *
   * @param line one raw line of the log file
   * @return `Some(url)` when the line has a field at [[UrlFieldIndex]],
   *         `None` when the line has too few space-separated fields
   */
  private def extractUrl(line: String): Option[String] =
    line.split(" ").lift(UrlFieldIndex)
}
